\relax 
\citation{cuda}
\citation{opencl}
\citation{DBLP:conf/vldb/BandiSAA04}
\citation{DBLP:conf/sigmod/GovindarajuLWLM04}
\citation{he:primitive}
\citation{cwi:uva}
\citation{jimgray:terasort}
\citation{satish:fastsort}
\citation{he:compression}
\citation{ross:olap}
\citation{DBLP:journals/pvldb/HeY11}
\citation{he:gdb}
\citation{tim:uva}
\citation{DBLP:journals/pvldb/AoZWSWLLL11}
\citation{Haicheng:fusion}
\citation{DBLP:conf/icde/LiebermanSS08}
\citation{DBLP:journals/pvldb/WangHLWZS12}
\citation{DBLP:conf/cidr/StonebrakerBCCGHHLRZ07}
\@writefile{toc}{\contentsline {section}{\numberline {1}Introduction}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.1}The Framework of Our Study}{\thepage }}
\citation{DBLP:journals/debu/IdreosGNMMK12}
\citation{DBLP:conf/icdcs/LeeLHWHZ11}
\citation{abadi:materialization}
\citation{eth:join}
\citation{yinan:join}
\citation{tim:uva}
\citation{DBLP:journals/tog/AlcantaraSASMOA09}
\citation{DBLP:books/cu/MotwaniR95}
\@writefile{lof}{\contentsline {figure}{\numberline {1}{\ignorespaces Research Overview: A 3-Dimension Study of Processing Warehousing Queries on GPUs.}}{\thepage }}
\newlabel{fig:overview}{{1}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2}Contributions of Performance Insights}{\thepage }}
\@writefile{toc}{\contentsline {section}{\numberline {2}GPU Query Engine}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.1}Engine Structure and Storage Format}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2}Query Operators}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {2}{\ignorespaces GPU Query Engine Architecture}}{\thepage }}
\newlabel{fig:gpudb}{{2}{\thepage }}
\citation{oneil:ssb}
\citation{DBLP:conf/sigmod/AbadiMH08}
\citation{DBLP:journals/pvldb/CandeaPV09}
\citation{amdsdk}
\@writefile{lot}{\contentsline {table}{\numberline {2}{\ignorespaces Hardware Specifications}}{\thepage }}
\newlabel{table:hardware}{{2}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.3}Implementation Details}{\thepage }}
\@writefile{toc}{\contentsline {section}{\numberline {3}Experimental Methodology}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.1}Workloads}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {3}{\ignorespaces Schema of SSBM}}{\thepage }}
\newlabel{fig:starschema}{{3}{\thepage }}
\@writefile{lot}{\contentsline {table}{\numberline {3}{\ignorespaces GPU Bandwidth Measurement}}{\thepage }}
\newlabel{table:bandwidth}{{3}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.2}Experimental Environments}{\thepage }}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {3.2.1}Hardware Platforms}{\thepage }}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {3.2.2}Software platforms}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.3}Measurement}{\thepage }}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {3.3.1}Methodology and tools}{\thepage }}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {3.3.2}Measurement of bandwidth}{\thepage }}
\@writefile{lot}{\contentsline {table}{\numberline {1}{\ignorespaces \textbf  {SSBM Summary}. The table lists the major operations and the Filter Factors (FF) for each SSBM query. L represents the fact table lineorder and D, S, C and P represent the four dimension tables: date, supplier, customer and part. }}{\thepage }}
\newlabel{table:workload}{{1}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {4}{\ignorespaces Baseline of SSBM queries on NVIDIA GTX 680. }}{\thepage }}
\newlabel{fig:ssbbase}{{4}{\thepage }}
\@writefile{toc}{\contentsline {section}{\numberline {4}Performance Analysis}{\thepage }}
\newlabel{sec:software}{{4}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.1}SSBM Query Behaviors}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {5}{\ignorespaces SSBM execution time breakdown}}{\thepage }}
\newlabel{fig:ssbbreak}{{5}{\thepage }}
\citation{DBLP:conf/sigmod/AbadiMF06}
\@writefile{lot}{\contentsline {table}{\numberline {4}{\ignorespaces Compression ratio for fact table columns when sorted on different foreign key columns.}}{\thepage }}
\newlabel{table:compression}{{4}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.2}Effects of data compression}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3}Effects of Transfer Overlapping}{\thepage }}
\newlabel{sec:uva}{{4.3}{\thepage }}
\citation{DBLP:conf/sigmod/AbadiMH08}
\newlabel{fig:ssbcompression}{{6(a)}{\thepage }}
\newlabel{sub@fig:ssbcompression}{{(a)}{\thepage }}
\newlabel{fig:uva}{{6(b)}{\thepage }}
\newlabel{sub@fig:uva}{{(b)}{\thepage }}
\newlabel{fig:invisiblejoin}{{6(c)}{\thepage }}
\newlabel{sub@fig:invisiblejoin}{{(c)}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {6}{\ignorespaces Effects of different software optimization techniques}}{\thepage }}
\@writefile{lof}{\contentsline {subfigure}{\numberline{(a)}{\ignorespaces {Speedup of data compression}}}{\thepage }}
\@writefile{lof}{\contentsline {subfigure}{\numberline{(b)}{\ignorespaces {Speedup of transfer overlapping}}}{\thepage }}
\@writefile{lof}{\contentsline {subfigure}{\numberline{(c)}{\ignorespaces {Speedup of invisible join}}}{\thepage }}
\newlabel{fig:breakdown}{{6}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.4}Effects of Invisible Join}{\thepage }}
\newlabel{sec:invisible}{{4.4}{\thepage }}
\@writefile{toc}{\contentsline {section}{\numberline {5}Performance Comparison}{\thepage }}
\newlabel{sec:comparison}{{5}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.1}Comparisons of GPU and CPU}{\thepage }}
\newlabel{sec:cpugpu}{{5.1}{\thepage }}
\citation{nvidiaopencl}
\@writefile{lof}{\contentsline {figure}{\numberline {7}{\ignorespaces SSBM performance comparison. For the performance on Intel Core i7, the performance of Q4.1 and Q4.2 are the performance on OpenCL engine while the rest are the performance on MonetDB.}}{\thepage }}
\newlabel{fig:overall}{{7}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {8}{\ignorespaces SSBM performance speedup}}{\thepage }}
\newlabel{fig:speedup}{{8}{\thepage }}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {5.1.1}Data are available in the pinned memory}{\thepage }}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {5.1.2}Data are available in the pageable memory}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.2}Impacts of programming models and GPU hardwares}{\thepage }}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {5.2.1}Comparisons of CUDA and NVIDIA OpenCL}{\thepage }}
\newlabel{sec:cudaopencl}{{5.2.1}{\thepage }}
\citation{DBLP:journals/pc/DuWLTPD12}
\citation{DBLP:journals/pc/DuWLTPD12}
\@writefile{lof}{\contentsline {figure}{\numberline {9}{\ignorespaces Normalized OpenCL performance over CUDA}}{\thepage }}
\newlabel{fig:openclbreakpageable}{{9}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {10}{\ignorespaces NVIDIA Versus AMD}}{\thepage }}
\newlabel{fig:nvidiaamd}{{10}{\thepage }}
\@writefile{toc}{\contentsline {subsubsection}{\numberline {5.2.2}Comparisons of NVIDIA and AMD GPUs}{\thepage }}
\newlabel{sec:nvidiaamd}{{5.2.2}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {11}{\ignorespaces Normalized SSBM performance on AMD GPU}}{\thepage }}
\newlabel{fig:amdBreak}{{11}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.3}Comparisons of OpenCL query engine on CPU with MonetDB}{\thepage }}
\newlabel{sec:cpus}{{5.3}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {12}{\ignorespaces SSBM performance comparison on CPU}}{\thepage }}
\newlabel{fig:openclMonet}{{12}{\thepage }}
\@writefile{toc}{\contentsline {section}{\numberline {6}Model and Prediction}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.1}Model Methodology}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.2}Cost Model for Join}{\thepage }}
\@writefile{lot}{\contentsline {table}{\numberline {5}{\ignorespaces Notations for the Cost Model}}{\thepage }}
\newlabel{table:notation}{{5}{\thepage }}
\newlabel{fig:modeljoin1}{{13(a)}{\thepage }}
\newlabel{sub@fig:modeljoin1}{{(a)}{\thepage }}
\newlabel{fig:modeljoin2}{{13(b)}{\thepage }}
\newlabel{sub@fig:modeljoin2}{{(b)}{\thepage }}
\newlabel{fig:modeljoin3}{{13(c)}{\thepage }}
\newlabel{sub@fig:modeljoin3}{{(c)}{\thepage }}
\newlabel{fig:modeljoin6}{{13(d)}{\thepage }}
\newlabel{sub@fig:modeljoin6}{{(d)}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {13}{\ignorespaces Evaluate join model for different query characteristics}}{\thepage }}
\@writefile{lof}{\contentsline {subfigure}{\numberline{(a)}{\ignorespaces {Selectivity (\%)}}}{\thepage }}
\@writefile{lof}{\contentsline {subfigure}{\numberline{(b)}{\ignorespaces {\# of fact columns}}}{\thepage }}
\@writefile{lof}{\contentsline {subfigure}{\numberline{(c)}{\ignorespaces {\# of dim columns}}}{\thepage }}
\@writefile{lof}{\contentsline {subfigure}{\numberline{(d)}{\ignorespaces {Dim column width}}}{\thepage }}
\newlabel{fig:evaljoin}{{13}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {14}{\ignorespaces Error rate of estimated performance on 680. }}{\thepage }}
\newlabel{fig:evalssb}{{14}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.3}Model Evaluation}{\thepage }}
\citation{DBLP:conf/vldb/BandiSAA04}
\citation{DBLP:conf/sigmod/GovindarajuLWLM04}
\citation{he:primitive}
\citation{cwi:uva}
\citation{jimgray:terasort}
\citation{satish:fastsort}
\citation{he:compression}
\citation{ross:olap}
\citation{DBLP:journals/pvldb/HeY11}
\citation{he:gdb}
\citation{tim:uva}
\citation{DBLP:journals/pvldb/WangHLWZS12}
\citation{DBLP:journals/pvldb/AoZWSWLLL11}
\citation{Haicheng:fusion}
\citation{DBLP:conf/icde/LiebermanSS08}
\citation{he:compression}
\citation{tim:uva}
\citation{cwi:uva}
\citation{he:gdb}
\citation{cuda:memory}
\@writefile{lof}{\contentsline {figure}{\numberline {15}{\ignorespaces Normalized kernel execution time on GTX 480}}{\thepage }}
\newlabel{fig:modelnorm}{{15}{\thepage }}
\@writefile{lof}{\contentsline {figure}{\numberline {16}{\ignorespaces Estimated SSBM performance with different GPU hardware configurations}}{\thepage }}
\newlabel{fig:modelpredict}{{16}{\thepage }}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.4}Impacts of hardware advancement}{\thepage }}
\@writefile{toc}{\contentsline {section}{\numberline {7}Other related Work}{\thepage }}
\@writefile{toc}{\contentsline {section}{\numberline {8}Conclusions}{\thepage }}
\bibstyle{abbrv}
\bibdata{vldb_2013}
\bibcite{amdsdk}{1}
\bibcite{cuda}{2}
\bibcite{cuda:memory}{3}
\bibcite{opencl}{4}
\bibcite{nvidiaopencl}{5}
\bibcite{abadi:materialization}{6}
\bibcite{DBLP:conf/sigmod/AbadiMF06}{7}
\bibcite{DBLP:conf/sigmod/AbadiMH08}{8}
\bibcite{DBLP:journals/tog/AlcantaraSASMOA09}{9}
\bibcite{DBLP:journals/pvldb/AoZWSWLLL11}{10}
\bibcite{eth:join}{11}
\bibcite{DBLP:conf/vldb/BandiSAA04}{12}
\bibcite{yinan:join}{13}
\bibcite{DBLP:journals/pvldb/CandeaPV09}{14}
\bibcite{DBLP:journals/pc/DuWLTPD12}{15}
\bibcite{he:compression}{16}
\bibcite{jimgray:terasort}{17}
\bibcite{DBLP:conf/sigmod/GovindarajuLWLM04}{18}
\bibcite{he:gdb}{19}
\bibcite{he:primitive}{20}
\bibcite{DBLP:journals/pvldb/HeY11}{21}
\bibcite{DBLP:journals/debu/IdreosGNMMK12}{22}
\bibcite{tim:uva}{23}
\bibcite{DBLP:conf/icdcs/LeeLHWHZ11}{24}
\bibcite{DBLP:conf/icde/LiebermanSS08}{25}
\bibcite{DBLP:books/cu/MotwaniR95}{26}
\bibcite{oneil:ssb}{27}
\bibcite{cwi:uva}{28}
\bibcite{satish:fastsort}{29}
\bibcite{ross:olap}{30}
\bibcite{DBLP:conf/cidr/StonebrakerBCCGHHLRZ07}{31}
\bibcite{DBLP:journals/pvldb/WangHLWZS12}{32}
\bibcite{Haicheng:fusion}{33}
\@writefile{toc}{\contentsline {section}{\numberline {9}Acknowledgments}{\thepage }}
\@writefile{toc}{\contentsline {section}{\numberline {10}References}{\thepage }}
